% ASPLOS 2024 (Volume 3) conference paper.
% Braces keep the mixed-case names TinyForge and tinyML intact under styles
% that convert titles to sentence case.
@inproceedings{giordano2024tinyforge,
  title={{TinyForge}: A Design Space Exploration to Advance Energy and Silicon Area Trade-offs in {tinyML} Compute Architectures with Custom Latch Arrays},
  author={Giordano, Massimo and Doshi, Rohan and Lu, Qianyun and Murmann, Boris},
  booktitle={Proceedings of the 29th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3},
  pages={1033--1047},
  year={2024}
}
% IEEE TCAD journal article. MLPerf is braced so sentence-casing styles do not
% lower-case the benchmark name.
% NOTE(review): volume, number and pages are absent from this entry; add them
% once confirmed against the publisher record.
@article{sun2023efficient,
  title={Efficient Processing of {MLPerf} Mobile Workloads Using Digital Compute-In-Memory Macros},
  author={Sun, Xiaoyu and Cao, Weidong and Crafton, Brian and Akarvardar, Kerem and Mori, Haruki and Fujiwara, Hidehiro and Noguchi, Hiroki and Chih, Yu-Der and Chang, Meng-Fan and Wang, Yih and others},
  journal={IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  year={2023},
  publisher={IEEE}
}
% MICRO 2024 conference paper.
% Title restored to title case (styles can lower-case it, but cannot recover
% lost capitals); the acronym BBS is braced to survive sentence casing.
% IEEE is recorded as publisher, matching the other IEEE entries in this file.
@inproceedings{chen2024bbs,
  title={{BBS}: Bi-directional Bit-level Sparsity for Deep Learning Acceleration},
  author={Chen, Yuzong and Meng, Jian and Seo, Jae-sun and Abdelfattah, Mohamed S.},
  booktitle={2024 57th IEEE/ACM International Symposium on Microarchitecture (MICRO)},
  pages={551--564},
  year={2024},
  publisher={IEEE}
}
% IEEE TCAD journal article. FedComp is braced so sentence-casing styles keep
% its internal capital.
% NOTE(review): volume, number and pages are absent from this entry; add them
% once confirmed against the publisher record.
@article{wu2023fedcomp,
  title={{FedComp}: A Federated Learning Compression Framework for Resource-Constrained Edge Computing Devices},
  author={Wu, Donglei and Yang, Weihao and Jin, Haoyu and Zou, Xiangyu and Xia, Wen and Fang, Binxing},
  journal={IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  year={2023},
  publisher={IEEE}
}
% IEEE TCAD journal article (volume 42, number 12).
% EdgeCompress and EdgeAI are braced so sentence-casing styles keep their
% internal capitals.
@article{kong2023edgecompress,
  title={{EdgeCompress}: Coupling Multidimensional Model Compression and Dynamic Inference for {EdgeAI}},
  author={Kong, Hao and Liu, Di and Huai, Shuo and Luo, Xiangzhong and Subramaniam, Ravi and Makaya, Christian and Lin, Qian and Liu, Weichen},
  journal={IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  volume={42},
  number={12},
  pages={4657--4670},
  year={2023},
  publisher={IEEE}
}
% IEEE TCAD journal article (volume 42, number 5).
% Title restored to title case; MobileNetv2 and FPGA are braced so they
% survive sentence casing.
% Year set to 2023: volume 42 of this journal is dated 2023 elsewhere in this
% file (volume 42, number 12). The citation key is deliberately left unchanged
% so existing citations keep resolving.
@article{jiang2022high,
  title={A High-Throughput Full-Dataflow {MobileNetv2} Accelerator on Edge {FPGA}},
  author={Jiang, Weixiong and Yu, Heng and Ha, Yajun},
  journal={IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems},
  volume={42},
  number={5},
  pages={1532--1545},
  year={2023},
  publisher={IEEE}
}

% NeurIPS paper (Advances in Neural Information Processing Systems, volume 35).
% Title restored to title case; the memory size 256KB is braced so the unit
% keeps its capitals under sentence-casing styles.
@article{lin2022device,
  title={On-Device Training Under {256KB} Memory},
  author={Lin, Ji and Zhu, Ligeng and Chen, Wei-Ming and Wang, Wei-Chen and Gan, Chuang and Han, Song},
  journal={Advances in Neural Information Processing Systems},
  volume={35},
  pages={22941--22954},
  year={2022}
}
% NeurIPS paper (Advances in Neural Information Processing Systems, volume 36).
% Title restored to title case; StreamNet is braced to keep its internal
% capital under sentence-casing styles.
% NOTE(review): volume 36 is paired with year 2024 here, while volume 35 is
% paired with 2022 in this file -- confirm the intended year. Pages are also
% absent and should be added once confirmed.
@article{zheng2024streamnet,
  title={{StreamNet}: Memory-Efficient Streaming Tiny Deep Learning Inference on the Microcontroller},
  author={Zheng, Hong-Sheng and Liu, Yu-Yuan and Hsu, Chen-Fong and Yeh, Tsung Tai},
  journal={Advances in Neural Information Processing Systems},
  volume={36},
  year={2024}
}
% ACM TACO journal article. The acronym SAL is braced to survive sentence
% casing. The publisher's city is split out of the publisher field into
% address.
% NOTE(review): volume, number and pages are absent from this entry; add them
% once confirmed against the publisher record.
@article{zhao2024sal,
  title={{SAL}: Optimizing the Dataflow of Spin-based Architectures for Lightweight Neural Networks},
  author={Zhao, Yunping and Ma, Sheng and Liu, Hengzhu and Li, Dongsheng},
  journal={ACM Transactions on Architecture and Code Optimization},
  year={2024},
  publisher={ACM},
  address={New York, NY}
}
% ACM TACO journal article. ReSA and DNN are braced to survive sentence
% casing. The publisher's city is split out of the publisher field into
% address.
% NOTE(review): volume, number and pages are absent from this entry; add them
% once confirmed against the publisher record.
@article{lee2024resa,
  title={{ReSA}: Reconfigurable Systolic Array for Multiple Tiny {DNN} Tensors},
  author={Lee, Ching-Jui and Yeh, Tsung Tai},
  journal={ACM Transactions on Architecture and Code Optimization},
  year={2024},
  publisher={ACM},
  address={New York, NY}
}
% ACM TACO journal article (volume 21, number 2).
% The acronym CNNs is braced to survive sentence casing. The publisher's city
% is split out of the publisher field into address.
@article{qararyah2024efficient,
  title={An Efficient Hybrid Deep Learning Accelerator for Compact and Heterogeneous {CNNs}},
  author={Qararyah, Fareed and Azhar, Muhammad Waqar and Trancoso, Pedro},
  journal={ACM Transactions on Architecture and Code Optimization},
  volume={21},
  number={2},
  pages={1--26},
  year={2024},
  publisher={ACM},
  address={New York, NY}
}
% ACM TACO journal article (volume 20, number 4).
% The acronym ULEEN is braced to survive sentence casing.
% Glued author initials (e.g. "DS") are split into separate initials
% ("D. S.") so name-abbreviating styles do not treat them as one given name.
% The publisher's city is split out of the publisher field into address.
@article{susskind2023uleen,
  title={{ULEEN}: A Novel Architecture for Ultra-low-energy Edge Neural Networks},
  author={Susskind, Zachary and Arora, Aman and Miranda, Igor D. S. and Bacellar, Alan T. L. and Villon, Luis A. Q. and Katopodis, Rafael F. and de Ara{\'u}jo, Leandro S. and Dutra, Diego L. C. and Lima, Priscila M. V. and Fran{\c{c}}a, Felipe M. G. and others},
  journal={ACM Transactions on Architecture and Code Optimization},
  volume={20},
  number={4},
  pages={1--24},
  year={2023},
  publisher={ACM},
  address={New York, NY}
}
% ACM TACO journal article (volume 20, number 4).
% The coined name Multiply-and-Fire is braced so sentence-casing styles do not
% lower-case "Fire". The publisher's city is split out of the publisher field
% into address.
@article{yu2023multiply,
  title={{Multiply-and-Fire}: An Event-Driven Sparse Neural Network Accelerator},
  author={Yu, Miao and Xiang, Tingting and Miriyala, Venkata Pavan Kumar and Carlson, Trevor E.},
  journal={ACM Transactions on Architecture and Code Optimization},
  volume={20},
  number={4},
  pages={1--26},
  year={2023},
  publisher={ACM},
  address={New York, NY}
}
